{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "01fa4731",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import pandas as pd\n",
    "from PIL import Image\n",
    "import os\n",
    "import cv2\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "from matplotlib import pyplot as plt\n",
    "import skimage.metrics\n",
    "from sklearn.feature_extraction.text import CountVectorizer\n",
    "import pytesseract\n",
    "pytesseract.pytesseract.tesseract_cmd = r'C:\\Program Files\\Tesseract-OCR\\tesseract.exe' # https://stackoverflow.com/questions/50951955/pytesseract-tesseractnotfound-error-tesseract-is-not-installed-or-its-not-i\n",
    "from numpy.linalg import norm\n",
    "from tensorflow.keras.applications.resnet50 import ResNet50,preprocess_input\n",
    "from tensorflow.keras.preprocessing import image\n",
    "from tqdm.auto import tqdm"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "9c988bae",
   "metadata": {
    "scrolled": true,
    "tags": []
   },
   "outputs": [],
   "source": [
    "# Import list of cities and forms (removing redacted BIT cities)\n",
    "forms_data = pd.read_stata('data/FormsSim.dta')\n",
    "forms_data = forms_data[forms_data['city']!='[REDACTED]']\n",
    "forms_data.reset_index(inplace=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "b4ab0d17",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "def sim(path1, path2):   \n",
    "    # Import the two images\n",
    "    image1 = cv2.imread(path1)\n",
    "    image2 = cv2.imread(path2)\n",
    "        \n",
    "    ## GRAPHIC SIMILARITY\n",
    "    # Get the width and height of images\n",
    "    width1, height1 = image1.shape[1], image1.shape[0]\n",
    "    width2, height2 = image2.shape[1], image2.shape[0]\n",
    "    \n",
    "    # Resize if above max dimensions that can be processed\n",
    "    if width1>32676 or height1>32676:\n",
    "        max_dim1=max(width1,height1)\n",
    "        res_fac1=32676/max_dim1\n",
    "        new_width1=round(width1*res_fac1)\n",
    "        new_height1=round(height1*res_fac1)\n",
    "        image1=cv2.resize(image1, (new_width1, new_height1))\n",
    "    if width2>32676 or height2>32676:\n",
    "        max_dim2=max(width2,height2)\n",
    "        res_fac2=32676/max_dim2\n",
    "        new_width2=round(width2*res_fac2)\n",
    "        new_height2=round(height2*res_fac2)\n",
    "        image2=cv2.resize(image2, (new_width2, new_height2))\n",
    "    \n",
    "    ## TEXT SIMILARITY\n",
    "    # Perform OCR on images\n",
    "    text1 = pytesseract.image_to_string(image1)\n",
    "    text2 = pytesseract.image_to_string(image2)\n",
    "    \n",
    "    # Vectorize strings\n",
    "    vectorizer = CountVectorizer(strip_accents='unicode') \n",
    "    [text1_vec, text2_vec] = vectorizer.fit_transform([text1,text2])\n",
    "\n",
    "    # Save vectorized strings in array format\n",
    "    [text1_vec_array, text2_vec_array] = [text1_vec.toarray(), text2_vec.toarray()] # Counts for word freq in each image\n",
    "    features = np.array([vectorizer.get_feature_names_out()]) # \"Dictionary\" for the array counts\n",
    "\n",
    "    # Keep only the words that appear at least 2 times across the two images\n",
    "    text_vec_array = text1_vec_array + text2_vec_array # Counts for word freq in BOTH images\n",
    "    [text1_vec_array_gt1, text2_vec_array_gt1] = [text1_vec_array[text_vec_array>1], text2_vec_array[text_vec_array>1]] # Subset words that appear >1 times\n",
    "    features_gt1 = features[text_vec_array>1] # Subset dictionary for words that appear >1 times\n",
    "\n",
    "    # Calculate textual cosine similarity\n",
    "    cos_gfx_sim = np.dot(text1_vec_array_gt1, text2_vec_array_gt1) / (np.linalg.norm(text1_vec_array_gt1) * np.linalg.norm(text2_vec_array_gt1))\n",
    "\n",
    "    # Calculate graphical cosine similarity\n",
    "    def return_image_embedding(model,img_path):\n",
    "        img = image.load_img(img_path, target_size=(224, 224))\n",
    "        x = image.img_to_array(img)\n",
    "        x = np.expand_dims(x, axis=0)\n",
    "        x = preprocess_input(x)\n",
    "        preds = model.predict(x)\n",
    "        curr_df = pd.DataFrame(preds[0]).T\n",
    "        return curr_df\n",
    "    model = ResNet50(include_top=False, weights='imagenet', pooling='avg')\n",
    "    img1_embedding = return_image_embedding(model, path1)\n",
    "    img2_embedding = return_image_embedding(model, path2)\n",
    "    img1_array = img1_embedding.to_numpy()\n",
    "    img2_array = img2_embedding.to_numpy()\n",
    "    cos_txt_sim = np.dot(img1_array,img2_array.T)[0][0]/(norm(img1_array)*norm(img2_array))\n",
    "    \n",
    "    return cos_txt_sim, cos_gfx_sim"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "d71ac2a8",
   "metadata": {
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "PHILADELPHIA\n",
      "Homestead Exemption Application\n",
      "2015\n",
      "2020\n",
      "1/1 [==============================] - 1s 769ms/step\n",
      "1/1 [==============================] - 0s 79ms/step\n",
      "PHILADELPHIA\n",
      "Homestead Exemption Application\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 631ms/step\n",
      "1/1 [==============================] - 0s 93ms/step\n",
      "SANANTONIO\n",
      "PD Property Loss Report\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 567ms/step\n",
      "1/1 [==============================] - 0s 82ms/step\n",
      "SANANTONIO\n",
      "Fire Drill Requirements\n",
      "2017\n",
      "2020\n",
      "1/1 [==============================] - 1s 577ms/step\n",
      "1/1 [==============================] - 0s 91ms/step\n",
      "SANANTONIO\n",
      "Fire Drill Requirements\n",
      "2015\n",
      "2016\n",
      "WARNING:tensorflow:5 out of the last 9 calls to <function Model.make_predict_function.<locals>.predict_function at 0x000001A3812D9E10> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for  more details.\n",
      "1/1 [==============================] - 1s 810ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "SANANTONIO\n",
      "Fire Drill Requirements\n",
      "2021\n",
      "2023\n",
      "WARNING:tensorflow:6 out of the last 11 calls to <function Model.make_predict_function.<locals>.predict_function at 0x000001A3812DA440> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for  more details.\n",
      "1/1 [==============================] - 1s 645ms/step\n",
      "1/1 [==============================] - 0s 98ms/step\n",
      "SANANTONIO\n",
      "Fire Drill Requirements\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 629ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "SANANTONIO\n",
      "PD Property Loss Report\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 643ms/step\n",
      "1/1 [==============================] - 0s 110ms/step\n",
      "SANANTONIO\n",
      "PD Property Loss Report\n",
      "2021\n",
      "2023\n",
      "1/1 [==============================] - 1s 637ms/step\n",
      "1/1 [==============================] - 0s 111ms/step\n",
      "SANANTONIO\n",
      "Fire Drill Requirements\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 736ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "SANANTONIO\n",
      "PD Property Loss Report\n",
      "2016\n",
      "2020\n",
      "1/1 [==============================] - 1s 644ms/step\n",
      "1/1 [==============================] - 0s 112ms/step\n",
      "SANDIEGO\n",
      "Business Finance Loan Application\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 740ms/step\n",
      "1/1 [==============================] - 0s 93ms/step\n",
      "SANDIEGO\n",
      "Study Guide Police Written Test\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 655ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "SANDIEGO\n",
      "Police Ride Along Request\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 643ms/step\n",
      "1/1 [==============================] - 0s 110ms/step\n",
      "SANDIEGO\n",
      "Business Finance Loan Application\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 635ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "SANDIEGO\n",
      "Citizen's Request Vacation House Check\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 638ms/step\n",
      "1/1 [==============================] - 0s 114ms/step\n",
      "SANDIEGO\n",
      "Business Finance Loan Application\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 691ms/step\n",
      "1/1 [==============================] - 0s 98ms/step\n",
      "SANDIEGO\n",
      "Study Guide Police Written Test\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 645ms/step\n",
      "1/1 [==============================] - 0s 152ms/step\n",
      "SANDIEGO\n",
      "Business Finance Loan Application\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 849ms/step\n",
      "1/1 [==============================] - 0s 94ms/step\n",
      "SANDIEGO\n",
      "Citizen's Request Vacation House Check\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 645ms/step\n",
      "1/1 [==============================] - 0s 111ms/step\n",
      "SANDIEGO\n",
      "Police Ride Along Request\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 838ms/step\n",
      "1/1 [==============================] - 0s 129ms/step\n",
      "SANDIEGO\n",
      "Study Guide Police Written Test\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 633ms/step\n",
      "1/1 [==============================] - 0s 94ms/step\n",
      "SANDIEGO\n",
      "Police Ride Along Request\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 606ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "SANDIEGO\n",
      "Police Ride Along Request\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 759ms/step\n",
      "1/1 [==============================] - 0s 124ms/step\n",
      "SANDIEGO\n",
      "Police Ride Along Request\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 622ms/step\n",
      "1/1 [==============================] - 0s 107ms/step\n",
      "SANDIEGO\n",
      "Study Guide Police Written Test\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 600ms/step\n",
      "1/1 [==============================] - 0s 88ms/step\n",
      "SANDIEGO\n",
      "Citizen's Request Vacation House Check\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 619ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "SANDIEGO\n",
      "Business Finance Loan Application\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 600ms/step\n",
      "1/1 [==============================] - 0s 88ms/step\n",
      "SANDIEGO\n",
      "Police Ride Along Request\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 600ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "SANDIEGO\n",
      "Business Finance Loan Application\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 649ms/step\n",
      "1/1 [==============================] - 0s 93ms/step\n",
      "SANDIEGO\n",
      "Citizen's Request Vacation House Check\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 709ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "SANDIEGO\n",
      "Citizen's Request Vacation House Check\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 687ms/step\n",
      "1/1 [==============================] - 0s 107ms/step\n",
      "SANDIEGO\n",
      "Citizen's Request Vacation House Check\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 654ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "SANDIEGO\n",
      "Citizen's Request Vacation House Check\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 639ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "SANDIEGO\n",
      "Citizen's Request Vacation House Check\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 648ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "SANDIEGO\n",
      "Study Guide Police Written Test\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 560ms/step\n",
      "1/1 [==============================] - 0s 82ms/step\n",
      "SANDIEGO\n",
      "Business Finance Loan Application\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 651ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "SANDIEGO\n",
      "Police Ride Along Request\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 656ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "SANDIEGO\n",
      "Study Guide Police Written Test\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 641ms/step\n",
      "1/1 [==============================] - 0s 88ms/step\n",
      "SANDIEGO\n",
      "Study Guide Police Written Test\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 645ms/step\n",
      "1/1 [==============================] - 0s 95ms/step\n",
      "SANDIEGO\n",
      "Study Guide Police Written Test\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 615ms/step\n",
      "1/1 [==============================] - 0s 94ms/step\n",
      "SANDIEGO\n",
      "Police Ride Along Request\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 646ms/step\n",
      "1/1 [==============================] - 0s 119ms/step\n",
      "SANDIEGO\n",
      "Business Finance Loan Application\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 567ms/step\n",
      "1/1 [==============================] - 0s 86ms/step\n",
      "DALLAS\n",
      "Vehicle Hangtag Application\n",
      "2020\n",
      "2022\n",
      "1/1 [==============================] - 1s 605ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "DALLAS\n",
      "Court Records Request\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 619ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "DALLAS\n",
      "Report of Theft\n",
      "2017\n",
      "2021\n",
      "1/1 [==============================] - 1s 633ms/step\n",
      "1/1 [==============================] - 0s 122ms/step\n",
      "DALLAS\n",
      "Vehicle Hangtag Application\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 725ms/step\n",
      "1/1 [==============================] - 0s 137ms/step\n",
      "DALLAS\n",
      "Citizen's Fire Academy Release Form\n",
      "2016\n",
      "2018\n",
      "1/1 [==============================] - 1s 647ms/step\n",
      "1/1 [==============================] - 0s 113ms/step\n",
      "DALLAS\n",
      "Report of Theft\n",
      "2021\n",
      "2023\n",
      "1/1 [==============================] - 1s 635ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "DALLAS\n",
      "Court Records Request\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 659ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "DALLAS\n",
      "Report of Theft\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 757ms/step\n",
      "1/1 [==============================] - 0s 111ms/step\n",
      "DALLAS\n",
      "Citizen's Fire Academy Release Form\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 647ms/step\n",
      "1/1 [==============================] - 0s 115ms/step\n",
      "DALLAS\n",
      "Report of Theft\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 637ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "DALLAS\n",
      "Vehicle Hangtag Application\n",
      "2018\n",
      "2020\n",
      "1/1 [==============================] - 1s 669ms/step\n",
      "1/1 [==============================] - 0s 126ms/step\n",
      "DALLAS\n",
      "Citizen's Fire Academy Release Form\n",
      "2019\n",
      "2023\n",
      "1/1 [==============================] - 1s 648ms/step\n",
      "1/1 [==============================] - 0s 109ms/step\n",
      "DALLAS\n",
      "Court Records Request\n",
      "2017\n",
      "2020\n",
      "1/1 [==============================] - 1s 693ms/step\n",
      "1/1 [==============================] - 0s 110ms/step\n",
      "DALLAS\n",
      "Citizen's Fire Academy Release Form\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 680ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "AUSTIN\n",
      "Deferred Disposition Request\n",
      "2017\n",
      "2019\n",
      "1/1 [==============================] - 1s 832ms/step\n",
      "1/1 [==============================] - 0s 138ms/step\n",
      "AUSTIN\n",
      "Citizen Police Academy Disqualifiers\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 656ms/step\n",
      "1/1 [==============================] - 0s 113ms/step\n",
      "AUSTIN\n",
      "Home Fire Hazard Checklist\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 662ms/step\n",
      "1/1 [==============================] - 0s 109ms/step\n",
      "AUSTIN\n",
      "Affordable Parking Program Application\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 739ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "AUSTIN\n",
      "Affordable Parking Program Application\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 670ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "AUSTIN\n",
      "Citizen Police Academy Disqualifiers\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 647ms/step\n",
      "1/1 [==============================] - 0s 115ms/step\n",
      "AUSTIN\n",
      "Citizen Police Academy Disqualifiers\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 721ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "AUSTIN\n",
      "Affordable Parking Program Application\n",
      "2018\n",
      "2020\n",
      "1/1 [==============================] - 1s 664ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "AUSTIN\n",
      "Home Fire Hazard Checklist\n",
      "2018\n",
      "2020\n",
      "1/1 [==============================] - 1s 643ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "AUSTIN\n",
      "Home Fire Hazard Checklist\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 653ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "AUSTIN\n",
      "Deferred Disposition Request\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 633ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "AUSTIN\n",
      "Citizen Police Academy Disqualifiers\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 639ms/step\n",
      "1/1 [==============================] - 0s 122ms/step\n",
      "AUSTIN\n",
      "Citizen Police Academy Disqualifiers\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 839ms/step\n",
      "1/1 [==============================] - 0s 135ms/step\n",
      "AUSTIN\n",
      "Home Fire Hazard Checklist\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 708ms/step\n",
      "1/1 [==============================] - 0s 108ms/step\n",
      "AUSTIN\n",
      "Home Fire Hazard Checklist\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 681ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "AUSTIN\n",
      "Citizen Police Academy Disqualifiers\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 846ms/step\n",
      "1/1 [==============================] - 0s 130ms/step\n",
      "AUSTIN\n",
      "Affordable Parking Program Application\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 647ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "AUSTIN\n",
      "Deferred Disposition Request\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 646ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "AUSTIN\n",
      "Citizen Police Academy Disqualifiers\n",
      "2017\n",
      "2019\n",
      "1/1 [==============================] - 1s 818ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "AUSTIN\n",
      "Home Fire Hazard Checklist\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 636ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "AUSTIN\n",
      "Home Fire Hazard Checklist\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 643ms/step\n",
      "1/1 [==============================] - 0s 116ms/step\n",
      "SANFRANCISCO\n",
      "Permit Application\n",
      "2019\n",
      "2023\n",
      "1/1 [==============================] - 1s 652ms/step\n",
      "1/1 [==============================] - 0s 114ms/step\n",
      "SANFRANCISCO\n",
      "Permit Application\n",
      "2015\n",
      "2019\n",
      "1/1 [==============================] - 1s 639ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "SEATTLE\n",
      "Ethics Code Commissions Board\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 650ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "SEATTLE\n",
      "Ethics Code Commissions Board\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 666ms/step\n",
      "1/1 [==============================] - 0s 119ms/step\n",
      "SEATTLE\n",
      "Earthquake Preparedness Brochure\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 642ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "SEATTLE\n",
      "Ethics Code Commissions Board\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 758ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "SEATTLE\n",
      "Ethics Code Commissions Board\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 642ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "SEATTLE\n",
      "Earthquake Preparedness Brochure\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 606ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "SEATTLE\n",
      "Code Violation Complaint Form\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 604ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "SEATTLE\n",
      "Earthquake Preparedness Brochure\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 682ms/step\n",
      "1/1 [==============================] - 0s 112ms/step\n",
      "SEATTLE\n",
      "Earthquake Preparedness Brochure\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 579ms/step\n",
      "1/1 [==============================] - 0s 94ms/step\n",
      "SEATTLE\n",
      "Earthquake Preparedness Brochure\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 600ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "SEATTLE\n",
      "Code Violation Complaint Form\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 683ms/step\n",
      "1/1 [==============================] - 0s 107ms/step\n",
      "SEATTLE\n",
      "Code Violation Complaint Form\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 629ms/step\n",
      "1/1 [==============================] - 0s 113ms/step\n",
      "SEATTLE\n",
      "Earthquake Preparedness Brochure\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 638ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "SEATTLE\n",
      "Earthquake Preparedness Brochure\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 634ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "SEATTLE\n",
      "Ethics Code Commissions Board\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 808ms/step\n",
      "1/1 [==============================] - 0s 146ms/step\n",
      "SEATTLE\n",
      "Code Violation Complaint Form\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 648ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "SEATTLE\n",
      "Code Violation Complaint Form\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 639ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "SEATTLE\n",
      "Ethics Code Commissions Board\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 637ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "SEATTLE\n",
      "Ethics Code Commissions Board\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 646ms/step\n",
      "1/1 [==============================] - 0s 108ms/step\n",
      "SEATTLE\n",
      "Code Violation Complaint Form\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 1s/step\n",
      "1/1 [==============================] - 0s 136ms/step\n",
      "SEATTLE\n",
      "Code Violation Complaint Form\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 634ms/step\n",
      "1/1 [==============================] - 0s 108ms/step\n",
      "SEATTLE\n",
      "Ethics Code Commissions Board\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 704ms/step\n",
      "1/1 [==============================] - 0s 131ms/step\n",
      "SEATTLE\n",
      "Earthquake Preparedness Brochure\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 646ms/step\n",
      "1/1 [==============================] - 0s 98ms/step\n",
      "SEATTLE\n",
      "Code Violation Complaint Form\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 640ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "ELPASO\n",
      "Code Enforcement Information\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 673ms/step\n",
      "1/1 [==============================] - 0s 107ms/step\n",
      "ELPASO\n",
      "Food Establishment Application\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 674ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "ELPASO\n",
      "Code Enforcement Information\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 654ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "ELPASO\n",
      "Code Enforcement Information\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 654ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "ELPASO\n",
      "Code Enforcement Information\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 644ms/step\n",
      "1/1 [==============================] - 0s 94ms/step\n",
      "ELPASO\n",
      "Code Enforcement Information\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 651ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "ELPASO\n",
      "Food Establishment Application\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 652ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "ELPASO\n",
      "Code Enforcement Information\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 689ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "ELPASO\n",
      "Code Enforcement Information\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 637ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "ELPASO\n",
      "Code Enforcement Information\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 646ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "NASHVILLE\n",
      "Online Permit Information Page\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 655ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "NASHVILLE\n",
      "Online Permit Information Page\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 651ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "NASHVILLE\n",
      "Online Permit Information Page\n",
      "2020\n",
      "2022\n",
      "1/1 [==============================] - 1s 861ms/step\n",
      "1/1 [==============================] - 0s 114ms/step\n",
      "NASHVILLE\n",
      "Online Permit Information Page\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 805ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "MEMPHIS\n",
      "Parades and Public Assemblies Application\n",
      "2016\n",
      "2020\n",
      "1/1 [==============================] - 1s 621ms/step\n",
      "1/1 [==============================] - 0s 95ms/step\n",
      "MEMPHIS\n",
      "Parades and Public Assemblies Application\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 634ms/step\n",
      "1/1 [==============================] - 0s 96ms/step\n",
      "BALTIMORE\n",
      "File a Police Report\n",
      "2019\n",
      "2023\n",
      "1/1 [==============================] - 1s 646ms/step\n",
      "1/1 [==============================] - 0s 94ms/step\n",
      "TUCSON\n",
      "Vote by Mail Locations\n",
      "2017\n",
      "2020\n",
      "1/1 [==============================] - 1s 636ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "TUCSON\n",
      "A Guide to Understanding How to File Rax Returns\n",
      "2015\n",
      "2017\n",
      "1/1 [==============================] - 1s 665ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "TUCSON\n",
      "Traffic and Pedestrian Safety Guide\n",
      "2020\n",
      "2022\n",
      "1/1 [==============================] - 1s 604ms/step\n",
      "1/1 [==============================] - 0s 85ms/step\n",
      "TUCSON\n",
      "Traffic and Pedestrian Safety Guide\n",
      "2015\n",
      "2020\n",
      "1/1 [==============================] - 1s 644ms/step\n",
      "1/1 [==============================] - 0s 87ms/step\n",
      "TUCSON\n",
      "Vote by Mail Locations\n",
      "2015\n",
      "2017\n",
      "1/1 [==============================] - 1s 836ms/step\n",
      "1/1 [==============================] - 0s 124ms/step\n",
      "TUCSON\n",
      "Business License Application\n",
      "2017\n",
      "2023\n",
      "1/1 [==============================] - 1s 633ms/step\n",
      "1/1 [==============================] - 0s 98ms/step\n",
      "TUCSON\n",
      "A Guide to Understanding How to File Rax Returns\n",
      "2017\n",
      "2023\n",
      "1/1 [==============================] - 1s 649ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "TUCSON\n",
      "Business License Application\n",
      "2015\n",
      "2017\n",
      "1/1 [==============================] - 1s 853ms/step\n",
      "1/1 [==============================] - 0s 132ms/step\n",
      "FRESNO\n",
      "Immigration Violations Policy Manual\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 650ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "FRESNO\n",
      "Police Cadet Job Posting\n",
      "2017\n",
      "2023\n",
      "1/1 [==============================] - 1s 649ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "FRESNO\n",
      "Business Tax Certificate Application\n",
      "2015\n",
      "2023\n",
      "1/1 [==============================] - 1s 642ms/step\n",
      "1/1 [==============================] - 0s 108ms/step\n",
      "FRESNO\n",
      "Immigration Violations Policy Manual\n",
      "2019\n",
      "2021\n",
      "1/1 [==============================] - 1s 752ms/step\n",
      "1/1 [==============================] - 0s 137ms/step\n",
      "SACRAMENTO\n",
      "Initiative Petition Process Time Line\n",
      "2018\n",
      "2021\n",
      "1/1 [==============================] - 1s 645ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "SACRAMENTO\n",
      "Initiative Petition Process Time Line\n",
      "2021\n",
      "2023\n",
      "1/1 [==============================] - 1s 643ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "SACRAMENTO\n",
      "Household Junk Appliance EWaste Pickup\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 640ms/step\n",
      "1/1 [==============================] - 0s 96ms/step\n",
      "SACRAMENTO\n",
      "Household Junk Appliance EWaste Pickup\n",
      "2016\n",
      "2020\n",
      "1/1 [==============================] - 1s 648ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "SACRAMENTO\n",
      "Resident Permit Application\n",
      "2018\n",
      "2020\n",
      "1/1 [==============================] - 1s 700ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "SACRAMENTO\n",
      "Resident Permit Application\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 654ms/step\n",
      "1/1 [==============================] - 0s 98ms/step\n",
      "ATLANTA\n",
      "Solid Waste Service Charges FAQs\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 649ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "ATLANTA\n",
      "Solid Waste Service Charges FAQs\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 663ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "RALEIGH\n",
      "Recording Disclosure Request Form\n",
      "2019\n",
      "2021\n",
      "1/1 [==============================] - 1s 650ms/step\n",
      "1/1 [==============================] - 0s 110ms/step\n",
      "RALEIGH\n",
      "Recording Disclosure Request Form\n",
      "2021\n",
      "2023\n",
      "1/1 [==============================] - 1s 611ms/step\n",
      "1/1 [==============================] - 0s 95ms/step\n",
      "LONGBEACH\n",
      "Police Core Values\n",
      "2017\n",
      "2019\n",
      "1/1 [==============================] - 1s 762ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "LONGBEACH\n",
      "Police Core Values\n",
      "2019\n",
      "2022\n",
      "1/1 [==============================] - 1s 823ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "OAKLAND\n",
      "Police Public Records Request Form\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 616ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "OAKLAND\n",
      "Police Public Records Request Form\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 641ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "OAKLAND\n",
      "Police Public Records Request Form\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 633ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "OAKLAND\n",
      "Police Public Records Request Form\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 647ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "OAKLAND\n",
      "Police Public Records Request Form\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 688ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "OAKLAND\n",
      "Police Public Records Request Form\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 716ms/step\n",
      "1/1 [==============================] - 0s 116ms/step\n",
      "OAKLAND\n",
      "Police Public Records Request Form\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 630ms/step\n",
      "1/1 [==============================] - 0s 98ms/step\n",
      "TULSA\n",
      "Request for Public Records\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 659ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "TULSA\n",
      "Adopt a Spot\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 809ms/step\n",
      "1/1 [==============================] - 0s 110ms/step\n",
      "TULSA\n",
      "Recreation Center Establishment Application Form\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 660ms/step\n",
      "1/1 [==============================] - 0s 113ms/step\n",
      "ARLINGTON\n",
      "Americans with Disability Complaint Form\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 646ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "ARLINGTON\n",
      "Burglar Alarm Permit Application\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 865ms/step\n",
      "1/1 [==============================] - 0s 114ms/step\n",
      "ARLINGTON\n",
      "Burglar Alarm Permit Application\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 624ms/step\n",
      "1/1 [==============================] - 0s 98ms/step\n",
      "ARLINGTON\n",
      "Americans with Disability Complaint Form\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 657ms/step\n",
      "1/1 [==============================] - 0s 116ms/step\n",
      "AURORA\n",
      "Business License Application\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 631ms/step\n",
      "1/1 [==============================] - 0s 93ms/step\n",
      "AURORA\n",
      "Candidate Committee Registration Form\n",
      "2021\n",
      "2023\n",
      "1/1 [==============================] - 1s 622ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "AURORA\n",
      "Candidate Committee Registration Form\n",
      "2016\n",
      "2021\n",
      "1/1 [==============================] - 1s 657ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "AURORA\n",
      "Commendation Form\n",
      "2016\n",
      "2020\n",
      "1/1 [==============================] - 1s 976ms/step\n",
      "1/1 [==============================] - 0s 131ms/step\n",
      "BAKERSFIELD\n",
      "Encroachment Permit Application\n",
      "2017\n",
      "2023\n",
      "1/1 [==============================] - 1s 902ms/step\n",
      "1/1 [==============================] - 0s 119ms/step\n",
      "BAKERSFIELD\n",
      "Fire Alarm Application\n",
      "2017\n",
      "2023\n",
      "1/1 [==============================] - 1s 629ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "BAKERSFIELD\n",
      "Encroachment Permit Application\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 649ms/step\n",
      "1/1 [==============================] - 0s 92ms/step\n",
      "BAKERSFIELD\n",
      "Liability Claim Form\n",
      "2017\n",
      "2023\n",
      "1/1 [==============================] - 1s 634ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "BAKERSFIELD\n",
      "Bicycle Transportation Plan\n",
      "2016\n",
      "2023\n",
      "1/1 [==============================] - 1s 657ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "ANAHEIM\n",
      "Police Volunteer Application\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 657ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "ANAHEIM\n",
      "Contesting a Parking Ticket\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 808ms/step\n",
      "1/1 [==============================] - 0s 133ms/step\n",
      "ANAHEIM\n",
      "Request for Public Records\n",
      "2016\n",
      "2018\n",
      "1/1 [==============================] - 1s 658ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "ANAHEIM\n",
      "Request for Public Records\n",
      "2020\n",
      "2022\n",
      "1/1 [==============================] - 1s 841ms/step\n",
      "1/1 [==============================] - 0s 121ms/step\n",
      "ANAHEIM\n",
      "Emergency Management Preparedness Webpage\n",
      "2015\n",
      "2019\n",
      "1/1 [==============================] - 1s 656ms/step\n",
      "1/1 [==============================] - 0s 107ms/step\n",
      "ANAHEIM\n",
      "Emergency Management Preparedness Webpage\n",
      "2019\n",
      "2023\n",
      "1/1 [==============================] - 1s 645ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "ANAHEIM\n",
      "Request for Public Records\n",
      "2018\n",
      "2020\n",
      "1/1 [==============================] - 1s 657ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "ANAHEIM\n",
      "Request for Public Records\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 633ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "ANAHEIM\n",
      "Request for Public Records\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 688ms/step\n",
      "1/1 [==============================] - 0s 113ms/step\n",
      "ANAHEIM\n",
      "Contesting a Parking Ticket\n",
      "2016\n",
      "2022\n",
      "1/1 [==============================] - 1s 641ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "ANAHEIM\n",
      "Police Volunteer Application\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 664ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "HONOLULU\n",
      "Police Commission Complaint Form\n",
      "2015\n",
      "2017\n",
      "1/1 [==============================] - 1s 645ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "HONOLULU\n",
      "Request for Offduty Officer\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 875ms/step\n",
      "1/1 [==============================] - 0s 116ms/step\n",
      "HONOLULU\n",
      "Police Commission Complaint Form\n",
      "2017\n",
      "2020\n",
      "1/1 [==============================] - 1s 664ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "HONOLULU\n",
      "Request for Offduty Officer\n",
      "2015\n",
      "2017\n",
      "1/1 [==============================] - 1s 635ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "RIVERSIDE\n",
      "Vote by Mail Application\n",
      "2015\n",
      "2018\n",
      "1/1 [==============================] - 1s 674ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "RIVERSIDE\n",
      "Building Permit Credit Card Authorization\n",
      "2017\n",
      "2019\n",
      "1/1 [==============================] - 1s 672ms/step\n",
      "1/1 [==============================] - 0s 120ms/step\n",
      "RIVERSIDE\n",
      "Vote by Mail Application\n",
      "2018\n",
      "2022\n",
      "1/1 [==============================] - 1s 642ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "RIVERSIDE\n",
      "Building Permit Credit Card Authorization\n",
      "2015\n",
      "2017\n",
      "1/1 [==============================] - 1s 649ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "CORPUSCHRISTI\n",
      "Application for Birth and Death Record\n",
      "2017\n",
      "2021\n",
      "1/1 [==============================] - 1s 816ms/step\n",
      "1/1 [==============================] - 0s 131ms/step\n",
      "CORPUSCHRISTI\n",
      "Park Volunteering Application\n",
      "2015\n",
      "2017\n",
      "1/1 [==============================] - 1s 623ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "CORPUSCHRISTI\n",
      "Park Volunteering Application\n",
      "2017\n",
      "2023\n",
      "1/1 [==============================] - 1s 640ms/step\n",
      "1/1 [==============================] - 0s 94ms/step\n",
      "CORPUSCHRISTI\n",
      "Flu Consent Form\n",
      "2015\n",
      "2020\n",
      "1/1 [==============================] - 1s 656ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "CORPUSCHRISTI\n",
      "Flu Consent Form\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 690ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "CORPUSCHRISTI\n",
      "Residential Building Permit Application\n",
      "2015\n",
      "2017\n",
      "1/1 [==============================] - 1s 630ms/step\n",
      "1/1 [==============================] - 0s 95ms/step\n",
      "CORPUSCHRISTI\n",
      "Application for Birth and Death Record\n",
      "2021\n",
      "2023\n",
      "1/1 [==============================] - 1s 620ms/step\n",
      "1/1 [==============================] - 0s 94ms/step\n",
      "CORPUSCHRISTI\n",
      "Residential Building Permit Application\n",
      "2017\n",
      "2022\n",
      "1/1 [==============================] - 1s 633ms/step\n",
      "1/1 [==============================] - 0s 111ms/step\n",
      "STOCKTON\n",
      "License and Microchip Information\n",
      "2018\n",
      "2020\n",
      "1/1 [==============================] - 1s 660ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "STOCKTON\n",
      "Business License Tax Application\n",
      "2017\n",
      "2021\n",
      "1/1 [==============================] - 1s 631ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "STOCKTON\n",
      "Business License Tax Application\n",
      "2015\n",
      "2017\n",
      "1/1 [==============================] - 1s 645ms/step\n",
      "1/1 [==============================] - 0s 96ms/step\n",
      "STOCKTON\n",
      "License and Microchip Information\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 897ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "PITTSBURGH\n",
      "911 vs 311 form\n",
      "2017\n",
      "2020\n",
      "1/1 [==============================] - 1s 668ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "PITTSBURGH\n",
      "911 vs 311 form\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 851ms/step\n",
      "1/1 [==============================] - 0s 127ms/step\n",
      "PLANO\n",
      "Alarm Permit Application\n",
      "2015\n",
      "2017\n",
      "1/1 [==============================] - 1s 626ms/step\n",
      "1/1 [==============================] - 0s 111ms/step\n",
      "IRVINE\n",
      "Instructions for Transient Occupancy Tax Return\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 674ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "IRVINE\n",
      "Instructions for Transient Occupancy Tax Return\n",
      "2015\n",
      "2020\n",
      "1/1 [==============================] - 1s 663ms/step\n",
      "1/1 [==============================] - 0s 112ms/step\n",
      "CHULAVISTA\n",
      "Community Garden Application\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 653ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "CHULAVISTA\n",
      "Community Garden Application\n",
      "2018\n",
      "2020\n",
      "1/1 [==============================] - 1s 660ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "TOLEDO\n",
      "Generic Tax Form\n",
      "2019\n",
      "2023\n",
      "1/1 [==============================] - 1s 637ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "TOLEDO\n",
      "Generic Tax Form\n",
      "2015\n",
      "2019\n",
      "1/1 [==============================] - 1s 702ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "LAREDO\n",
      "Building Permit Application\n",
      "2016\n",
      "2019\n",
      "1/1 [==============================] - 1s 615ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "LAREDO\n",
      "Building Permit Application\n",
      "2019\n",
      "2023\n",
      "1/1 [==============================] - 1s 610ms/step\n",
      "1/1 [==============================] - 0s 98ms/step\n",
      "MADISONWI\n",
      "Payment Center\n",
      "2016\n",
      "2020\n",
      "1/1 [==============================] - 1s 612ms/step\n",
      "1/1 [==============================] - 0s 94ms/step\n",
      "MADISONWI\n",
      "Payment Center\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 646ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "LUBBOCK\n",
      "Class Registration Form\n",
      "2015\n",
      "2018\n",
      "1/1 [==============================] - 1s 664ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "LUBBOCK\n",
      "Alarm Permit Application\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 655ms/step\n",
      "1/1 [==============================] - 0s 110ms/step\n",
      "LUBBOCK\n",
      "Class Registration Form\n",
      "2018\n",
      "2023\n",
      "1/1 [==============================] - 1s 657ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "RENO\n",
      "Building Permit Application\n",
      "2021\n",
      "2023\n",
      "1/1 [==============================] - 1s 653ms/step\n",
      "1/1 [==============================] - 0s 108ms/step\n",
      "RENO\n",
      "Building Permit Application\n",
      "2015\n",
      "2021\n",
      "1/1 [==============================] - 1s 885ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "GILBERT\n",
      "Hydrant Meter Construction\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 667ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "GILBERT\n",
      "Hydrant Meter Construction\n",
      "2015\n",
      "2020\n",
      "1/1 [==============================] - 1s 645ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "CHESAPEAKE\n",
      "Waste Collection Brochure\n",
      "2015\n",
      "2019\n",
      "1/1 [==============================] - 1s 630ms/step\n",
      "1/1 [==============================] - 0s 96ms/step\n",
      "CHESAPEAKE\n",
      "Waste Collection Brochure\n",
      "2019\n",
      "2023\n",
      "1/1 [==============================] - 1s 640ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "SPOKANE\n",
      "Request for Expungement\n",
      "2015\n",
      "2020\n",
      "1/1 [==============================] - 1s 657ms/step\n",
      "1/1 [==============================] - 0s 108ms/step\n",
      "SPOKANE\n",
      "Request for Expungement\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 681ms/step\n",
      "1/1 [==============================] - 0s 118ms/step\n",
      "TEMPE\n",
      "Vacation Notification Form\n",
      "2019\n",
      "2021\n",
      "1/1 [==============================] - 1s 850ms/step\n",
      "1/1 [==============================] - 0s 124ms/step\n",
      "TEMPE\n",
      "Vacation Notification Form\n",
      "2021\n",
      "2023\n",
      "1/1 [==============================] - 1s 626ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "GLENDALE\n",
      "Commendation Form\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 642ms/step\n",
      "1/1 [==============================] - 0s 114ms/step\n",
      "GLENDALE\n",
      "Commendation Form\n",
      "2017\n",
      "2023\n",
      "1/1 [==============================] - 1s 646ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "KNOXVILLE\n",
      "Suspicious Activity Form\n",
      "2018\n",
      "2020\n",
      "1/1 [==============================] - 1s 657ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "KNOXVILLE\n",
      "Crime Analysis Citizens Request Form\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 666ms/step\n",
      "1/1 [==============================] - 0s 118ms/step\n",
      "KNOXVILLE\n",
      "Crime Analysis Citizens Request Form\n",
      "2019\n",
      "2023\n",
      "1/1 [==============================] - 1s 643ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "KNOXVILLE\n",
      "Suspicious Activity Form\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 776ms/step\n",
      "1/1 [==============================] - 0s 111ms/step\n",
      "FORTCOLLINS\n",
      "Unclaimed Funds Form\n",
      "2021\n",
      "2023\n",
      "1/1 [==============================] - 1s 665ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "FORTCOLLINS\n",
      "Affordable Housing Poster\n",
      "2017\n",
      "2023\n",
      "1/1 [==============================] - 1s 637ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "FORTCOLLINS\n",
      "Affordable Housing Poster\n",
      "2015\n",
      "2017\n",
      "1/1 [==============================] - 1s 646ms/step\n",
      "1/1 [==============================] - 0s 119ms/step\n",
      "FORTCOLLINS\n",
      "Sales Tax Change Form\n",
      "2015\n",
      "2017\n",
      "1/1 [==============================] - 1s 1s/step\n",
      "1/1 [==============================] - 0s 130ms/step\n",
      "FORTCOLLINS\n",
      "Vehicle Idling Brochure\n",
      "2015\n",
      "2020\n",
      "1/1 [==============================] - 1s 660ms/step\n",
      "1/1 [==============================] - 0s 122ms/step\n",
      "FORTCOLLINS\n",
      "Unclaimed Funds Form\n",
      "2017\n",
      "2021\n",
      "1/1 [==============================] - 1s 650ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "FORTCOLLINS\n",
      "Vehicle Idling Brochure\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 827ms/step\n",
      "1/1 [==============================] - 0s 141ms/step\n",
      "FORTCOLLINS\n",
      "Sales Tax Change Form\n",
      "2017\n",
      "2023\n",
      "1/1 [==============================] - 1s 639ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "MACONBIBB\n",
      "Business License Application\n",
      "2016\n",
      "2023\n",
      "1/1 [==============================] - 1s 645ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "MIDLAND\n",
      "Citizen Police Application Form\n",
      "2021\n",
      "2023\n",
      "1/1 [==============================] - 1s 659ms/step\n",
      "1/1 [==============================] - 0s 118ms/step\n",
      "MIDLAND\n",
      "Citizen Police Application Form\n",
      "2019\n",
      "2021\n",
      "1/1 [==============================] - 1s 648ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "SAVANNAH\n",
      "New Business Application\n",
      "2019\n",
      "2023\n",
      "1/1 [==============================] - 1s 655ms/step\n",
      "1/1 [==============================] - 0s 119ms/step\n",
      "SAVANNAH\n",
      "New Business Application\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 639ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "THOUSANDOAKS\n",
      "Code Compliance Complaint Form\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 663ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "THOUSANDOAKS\n",
      "Code Compliance Complaint Form\n",
      "2016\n",
      "2020\n",
      "1/1 [==============================] - 1s 676ms/step\n",
      "1/1 [==============================] - 0s 107ms/step\n",
      "COLUMBIA\n",
      "Group Home Application\n",
      "2017\n",
      "2022\n",
      "1/1 [==============================] - 1s 653ms/step\n",
      "1/1 [==============================] - 0s 119ms/step\n",
      "COLUMBIA\n",
      "Volunteer Award Nomination Form\n",
      "2021\n",
      "2023\n",
      "1/1 [==============================] - 1s 642ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "COLUMBIA\n",
      "Solar Ready Requirements\n",
      "2021\n",
      "2023\n",
      "1/1 [==============================] - 1s 791ms/step\n",
      "1/1 [==============================] - 0s 128ms/step\n",
      "COLUMBIA\n",
      "Group Home Application\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 655ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "COLUMBIA\n",
      "Solar Ready Requirements\n",
      "2017\n",
      "2021\n",
      "1/1 [==============================] - 1s 640ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "COLUMBIA\n",
      "Volunteer Award Nomination Form\n",
      "2017\n",
      "2021\n",
      "1/1 [==============================] - 1s 712ms/step\n",
      "1/1 [==============================] - 0s 128ms/step\n",
      "ABILENE\n",
      "Citizen Complaint Form\n",
      "2015\n",
      "2019\n",
      "1/1 [==============================] - 1s 860ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "ABILENE\n",
      "Citizen Complaint Form\n",
      "2019\n",
      "2023\n",
      "1/1 [==============================] - 1s 666ms/step\n",
      "1/1 [==============================] - 0s 113ms/step\n",
      "MERIDIAN\n",
      "Withdrawal of Candidacy\n",
      "2017\n",
      "2023\n",
      "1/1 [==============================] - 1s 672ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "ROCHESTER\n",
      "Sewer and Drain License Application\n",
      "2015\n",
      "2020\n",
      "1/1 [==============================] - 1s 643ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "ROCHESTER\n",
      "Sewer and Drain License Application\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 651ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "CAMBRIDGE\n",
      "Recreation Special Needs Program Application\n",
      "2015\n",
      "2018\n",
      "1/1 [==============================] - 1s 639ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "CAMBRIDGE\n",
      "Recreation Special Needs Program Application\n",
      "2018\n",
      "2023\n",
      "1/1 [==============================] - 1s 651ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "CAMBRIDGE\n",
      "Disability Parking Permit\n",
      "2015\n",
      "2022\n",
      "1/1 [==============================] - 1s 748ms/step\n",
      "1/1 [==============================] - 0s 120ms/step\n",
      "CAMBRIDGE\n",
      "Disability Parking Permit\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 645ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "SUGARLAND\n",
      "Police Recruit Job Description\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 649ms/step\n",
      "1/1 [==============================] - 0s 98ms/step\n",
      "SUGARLAND\n",
      "Police Recruit Job Description\n",
      "2015\n",
      "2020\n",
      "1/1 [==============================] - 1s 750ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "INDEPENDENCE\n",
      "Property Tax Abatement\n",
      "2015\n",
      "2020\n",
      "1/1 [==============================] - 1s 718ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "INDEPENDENCE\n",
      "Property Tax Abatement\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 661ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "PROVO\n",
      "Events and Services Application\n",
      "2018\n",
      "2023\n",
      "1/1 [==============================] - 1s 656ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "SPRINGFIELD\n",
      "FOIA Request Form\n",
      "2016\n",
      "2019\n",
      "1/1 [==============================] - 1s 669ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "SPRINGFIELD\n",
      "FOIA Request Form\n",
      "2019\n",
      "2023\n",
      "1/1 [==============================] - 1s 840ms/step\n",
      "1/1 [==============================] - 0s 129ms/step\n",
      "MANCHESTER\n",
      "Mayor Declaration of Candidacy\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 634ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "MANCHESTER\n",
      "Mayor Declaration of Candidacy\n",
      "2015\n",
      "2020\n",
      "1/1 [==============================] - 1s 642ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "BOULDER\n",
      "Background Check Request\n",
      "2021\n",
      "2023\n",
      "1/1 [==============================] - 1s 642ms/step\n",
      "1/1 [==============================] - 0s 98ms/step\n",
      "BOULDER\n",
      "Background Check Request\n",
      "2017\n",
      "2021\n",
      "1/1 [==============================] - 1s 659ms/step\n",
      "1/1 [==============================] - 0s 109ms/step\n",
      "GREENBAY\n",
      "Permissible Uses Form\n",
      "2019\n",
      "2023\n",
      "1/1 [==============================] - 1s 694ms/step\n",
      "1/1 [==============================] - 0s 112ms/step\n",
      "GREENBAY\n",
      "Permissible Uses Form\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 658ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "NAMPA\n",
      "Utility Assistance Program Brochure\n",
      "2017\n",
      "2021\n",
      "1/1 [==============================] - 1s 668ms/step\n",
      "1/1 [==============================] - 0s 109ms/step\n",
      "NAMPA\n",
      "Utility Assistance Program Brochure\n",
      "2021\n",
      "2023\n",
      "1/1 [==============================] - 1s 849ms/step\n",
      "1/1 [==============================] - 0s 132ms/step\n",
      "YUMA\n",
      "Building Permit Application\n",
      "2016\n",
      "2020\n",
      "1/1 [==============================] - 1s 652ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "YUMA\n",
      "Building Permit Application\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 660ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "KENOSHA\n",
      "Retail Theft Reporting Procedure\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 640ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "KENOSHA\n",
      "City Assessor Frequently Asked Questions\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 648ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "KENOSHA\n",
      "City Assessor Frequently Asked Questions\n",
      "2017\n",
      "2020\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "C:\\Users\\wooji\\anaconda3\\lib\\site-packages\\PIL\\Image.py:3167: DecompressionBombWarning: Image size (89760000 pixels) exceeds limit of 89478485 pixels, could be decompression bomb DOS attack.\n",
      "  warnings.warn(\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1/1 [==============================] - 1s 659ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "KENOSHA\n",
      "Retail Theft Reporting Procedure\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 657ms/step\n",
      "1/1 [==============================] - 0s 110ms/step\n",
      "OREM\n",
      "Commercial Plans Submittal Checklist\n",
      "2018\n",
      "2023\n",
      "1/1 [==============================] - 1s 648ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "O'FALLON\n",
      "Erosion Control Brochure\n",
      "2016\n",
      "2023\n",
      "1/1 [==============================] - 1s 777ms/step\n",
      "1/1 [==============================] - 0s 126ms/step\n",
      "HOOVER\n",
      "Police Recruitment Page\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 665ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "HOOVER\n",
      "Police Recruitment Page\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 691ms/step\n",
      "1/1 [==============================] - 0s 123ms/step\n",
      "HOOVER\n",
      "Police Recruitment Page\n",
      "2017\n",
      "2019\n",
      "1/1 [==============================] - 1s 647ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "HOOVER\n",
      "Water Conservation Standards\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 656ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "HOOVER\n",
      "Water Conservation Standards\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 847ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "HOOVER\n",
      "Request for Appearance\n",
      "2015\n",
      "2018\n",
      "1/1 [==============================] - 1s 654ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "HOOVER\n",
      "Police Recruitment Page\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 853ms/step\n",
      "1/1 [==============================] - 0s 126ms/step\n",
      "HOOVER\n",
      "Police Recruitment Page\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 649ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "HOOVER\n",
      "Police Recruitment Page\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 818ms/step\n",
      "1/1 [==============================] - 0s 131ms/step\n",
      "HOOVER\n",
      "Water Conservation Standards\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 654ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "HOOVER\n",
      "Police Recruitment Page\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 835ms/step\n",
      "1/1 [==============================] - 0s 128ms/step\n",
      "HOOVER\n",
      "Water Conservation Standards\n",
      "2017\n",
      "2020\n",
      "1/1 [==============================] - 1s 649ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "HOOVER\n",
      "Water Conservation Standards\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 834ms/step\n",
      "1/1 [==============================] - 0s 128ms/step\n",
      "HOOVER\n",
      "Request for Appearance\n",
      "2018\n",
      "2022\n",
      "1/1 [==============================] - 1s 860ms/step\n",
      "1/1 [==============================] - 0s 107ms/step\n",
      "HOOVER\n",
      "Water Conservation Standards\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 712ms/step\n",
      "1/1 [==============================] - 0s 109ms/step\n",
      "BLOOMINGTON\n",
      "Police Application\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 657ms/step\n",
      "1/1 [==============================] - 0s 94ms/step\n",
      "BLOOMINGTON\n",
      "Tax Abatement Program\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 627ms/step\n",
      "1/1 [==============================] - 0s 94ms/step\n",
      "BLOOMINGTON\n",
      "Police Application\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 669ms/step\n",
      "1/1 [==============================] - 0s 92ms/step\n",
      "BLOOMINGTON\n",
      "Police Application\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 608ms/step\n",
      "1/1 [==============================] - 0s 90ms/step\n",
      "BLOOMINGTON\n",
      "Police Application\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 850ms/step\n",
      "1/1 [==============================] - 0s 117ms/step\n",
      "BLOOMINGTON\n",
      "Police Application\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 696ms/step\n",
      "1/1 [==============================] - 0s 128ms/step\n",
      "BLOOMINGTON\n",
      "Tax Abatement Program\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 626ms/step\n",
      "1/1 [==============================] - 0s 98ms/step\n",
      "BLOOMINGTON\n",
      "Police Application\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 634ms/step\n",
      "1/1 [==============================] - 0s 92ms/step\n",
      "BLOOMINGTON\n",
      "Police Application\n",
      "2019\n",
      "2021\n",
      "1/1 [==============================] - 1s 685ms/step\n",
      "1/1 [==============================] - 0s 114ms/step\n",
      "BLOOMINGTON\n",
      "Tax Abatement Program\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 650ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "BLOOMINGTON\n",
      "Tax Abatement Program\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 710ms/step\n",
      "1/1 [==============================] - 0s 128ms/step\n",
      "BLOOMINGTON\n",
      "Tax Abatement Program\n",
      "2019\n",
      "2021\n",
      "1/1 [==============================] - 1s 640ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "SANTAFE\n",
      "Police Recruitment Packet\n",
      "2016\n",
      "2023\n",
      "1/1 [==============================] - 1s 774ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "SANTAFE\n",
      "Low Income Adjustment\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 670ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "SANTAFE\n",
      "Donation Form\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 825ms/step\n",
      "1/1 [==============================] - 0s 137ms/step\n",
      "SANTAFE\n",
      "Low Income Adjustment\n",
      "2015\n",
      "2020\n",
      "1/1 [==============================] - 1s 636ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "SANTAFE\n",
      "Donation Form\n",
      "2017\n",
      "2020\n",
      "1/1 [==============================] - 1s 893ms/step\n",
      "1/1 [==============================] - 0s 124ms/step\n",
      "SANTAFE\n",
      "Low Income Adjustment\n",
      "2020\n",
      "2022\n",
      "1/1 [==============================] - 1s 646ms/step\n",
      "1/1 [==============================] - 0s 110ms/step\n",
      "SANTAFE\n",
      "Donation Form\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 654ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "BLOOMINGTON\n",
      "Construction Guidelines\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 788ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "BLOOMINGTON\n",
      "Construction Guidelines\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 656ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "BLOOMINGTON\n",
      "Construction Guidelines\n",
      "2017\n",
      "2021\n",
      "1/1 [==============================] - 1s 657ms/step\n",
      "1/1 [==============================] - 0s 96ms/step\n",
      "DANBURY\n",
      "Early Childhood Brochure\n",
      "2017\n",
      "2020\n",
      "1/1 [==============================] - 1s 659ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "SOMERVILLE\n",
      "Residency Affadavit\n",
      "2018\n",
      "2021\n",
      "1/1 [==============================] - 1s 642ms/step\n",
      "1/1 [==============================] - 0s 110ms/step\n",
      "LAWRENCE\n",
      "Player Form\n",
      "2015\n",
      "2017\n",
      "1/1 [==============================] - 1s 693ms/step\n",
      "1/1 [==============================] - 0s 108ms/step\n",
      "LAWRENCE\n",
      "Player Form\n",
      "2017\n",
      "2023\n",
      "1/1 [==============================] - 1s 843ms/step\n",
      "1/1 [==============================] - 0s 125ms/step\n",
      "LAWRENCE\n",
      "City Charter\n",
      "2021\n",
      "2023\n",
      "1/1 [==============================] - 1s 840ms/step\n",
      "1/1 [==============================] - 0s 119ms/step\n",
      "LAWRENCE\n",
      "City Charter\n",
      "2015\n",
      "2021\n",
      "1/1 [==============================] - 1s 811ms/step\n",
      "1/1 [==============================] - 0s 116ms/step\n",
      "PLYMOUTH\n",
      "Property Tax Exemption\n",
      "2017\n",
      "2022\n",
      "1/1 [==============================] - 1s 660ms/step\n",
      "1/1 [==============================] - 0s 107ms/step\n",
      "PLYMOUTH\n",
      "Property Tax Exemption\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 670ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "PLYMOUTH\n",
      "Property Tax Exemption\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 706ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "SOUTHJORDAN\n",
      "Employee Benefits Guide\n",
      "2016\n",
      "2018\n",
      "1/1 [==============================] - 1s 796ms/step\n",
      "1/1 [==============================] - 0s 107ms/step\n",
      "SOUTHJORDAN\n",
      "Employee Benefits Guide\n",
      "2020\n",
      "2022\n",
      "1/1 [==============================] - 1s 654ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "SOUTHJORDAN\n",
      "Employee Benefits Guide\n",
      "2022\n",
      "2023\n",
      "1/1 [==============================] - 1s 823ms/step\n",
      "1/1 [==============================] - 0s 116ms/step\n",
      "SOUTHJORDAN\n",
      "Employee Benefits Guide\n",
      "2018\n",
      "2020\n",
      "1/1 [==============================] - 1s 876ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "MISSOULA\n",
      "Mayor Schedule Request\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 673ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "MISSOULA\n",
      "Pothole Report Form\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 657ms/step\n",
      "1/1 [==============================] - 0s 118ms/step\n",
      "MISSOULA\n",
      "Mayor Schedule Request\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 656ms/step\n",
      "1/1 [==============================] - 0s 98ms/step\n",
      "MISSOULA\n",
      "Pothole Report Form\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 806ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "MISSOULA\n",
      "Mayor Schedule Request\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 682ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "MISSOULA\n",
      "Pothole Report Form\n",
      "2018\n",
      "2023\n",
      "1/1 [==============================] - 1s 656ms/step\n",
      "1/1 [==============================] - 0s 110ms/step\n",
      "MISSOULA\n",
      "Pothole Report Form\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 825ms/step\n",
      "1/1 [==============================] - 0s 128ms/step\n",
      "FLAGSTAFF\n",
      "Discrimination Complaint Form\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 646ms/step\n",
      "1/1 [==============================] - 0s 98ms/step\n",
      "FLAGSTAFF\n",
      "Graffiti Removal Volunteer Form\n",
      "2017\n",
      "2022\n",
      "1/1 [==============================] - 1s 665ms/step\n",
      "1/1 [==============================] - 0s 123ms/step\n",
      "FLAGSTAFF\n",
      "Discrimination Complaint Form\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 667ms/step\n",
      "1/1 [==============================] - 0s 104ms/step\n",
      "FLAGSTAFF\n",
      "Discrimination Complaint Form\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 877ms/step\n",
      "1/1 [==============================] - 0s 109ms/step\n",
      "FLAGSTAFF\n",
      "Graffiti Removal Volunteer Form\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 643ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "FLAGSTAFF\n",
      "Discrimination Complaint Form\n",
      "2017\n",
      "2020\n",
      "1/1 [==============================] - 1s 869ms/step\n",
      "1/1 [==============================] - 0s 125ms/step\n",
      "FLAGSTAFF\n",
      "Discrimination Complaint Form\n",
      "2021\n",
      "2022\n",
      "1/1 [==============================] - 1s 666ms/step\n",
      "1/1 [==============================] - 0s 109ms/step\n",
      "LEHI\n",
      "New Resident Utility Application\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 658ms/step\n",
      "1/1 [==============================] - 0s 113ms/step\n",
      "LEHI\n",
      "Volunteer Application\n",
      "2018\n",
      "2020\n",
      "1/1 [==============================] - 1s 648ms/step\n",
      "1/1 [==============================] - 0s 113ms/step\n",
      "LEHI\n",
      "Volunteer Application\n",
      "2016\n",
      "2018\n",
      "1/1 [==============================] - 1s 633ms/step\n",
      "1/1 [==============================] - 0s 101ms/step\n",
      "LEHI\n",
      "Volunteer Application\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 644ms/step\n",
      "1/1 [==============================] - 0s 96ms/step\n",
      "LEHI\n",
      "New Resident Utility Application\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 841ms/step\n",
      "1/1 [==============================] - 0s 136ms/step\n",
      "DOTHAN\n",
      "Recycle Registration Form\n",
      "2015\n",
      "2019\n",
      "1/1 [==============================] - 1s 647ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "DOTHAN\n",
      "Recycle Registration Form\n",
      "2019\n",
      "2023\n",
      "1/1 [==============================] - 1s 648ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "JOHNSON\n",
      "New Construction Addressing\n",
      "2015\n",
      "2016\n",
      "1/1 [==============================] - 1s 630ms/step\n",
      "1/1 [==============================] - 0s 99ms/step\n",
      "JOHNSON\n",
      "New Construction Addressing\n",
      "2016\n",
      "2017\n",
      "1/1 [==============================] - 1s 655ms/step\n",
      "1/1 [==============================] - 0s 109ms/step\n",
      "JOHNSON\n",
      "New Construction Addressing\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 654ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "CHEYENNE\n",
      "Unacceptable Driving Criteria\n",
      "2020\n",
      "2021\n",
      "1/1 [==============================] - 1s 787ms/step\n",
      "1/1 [==============================] - 0s 107ms/step\n",
      "CHEYENNE\n",
      "Unacceptable Driving Criteria\n",
      "2015\n",
      "2020\n",
      "1/1 [==============================] - 1s 649ms/step\n",
      "1/1 [==============================] - 0s 106ms/step\n",
      "GRANDJUNCTION\n",
      "Certificate of Taxes Due\n",
      "2017\n",
      "2023\n",
      "1/1 [==============================] - 1s 650ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "SOUTHAVEN\n",
      "Mayors Office FAQs\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 677ms/step\n",
      "1/1 [==============================] - 0s 102ms/step\n",
      "SOUTHAVEN\n",
      "Mayors Office FAQs\n",
      "2016\n",
      "2020\n",
      "1/1 [==============================] - 1s 729ms/step\n",
      "1/1 [==============================] - 0s 109ms/step\n",
      "SMYRNA\n",
      "Service Request Form\n",
      "2017\n",
      "2018\n",
      "1/1 [==============================] - 1s 656ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "SMYRNA\n",
      "Service Request Form\n",
      "2018\n",
      "2023\n",
      "1/1 [==============================] - 1s 642ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "SMYRNA\n",
      "Utilities FAQs\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 867ms/step\n",
      "1/1 [==============================] - 0s 125ms/step\n",
      "SMYRNA\n",
      "Utilities FAQs\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 719ms/step\n",
      "1/1 [==============================] - 0s 108ms/step\n",
      "MADISONAL\n",
      "Home Buisness Application\n",
      "2019\n",
      "2023\n",
      "1/1 [==============================] - 1s 672ms/step\n",
      "1/1 [==============================] - 0s 100ms/step\n",
      "MADISONAL\n",
      "Plumbing Permit\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 708ms/step\n",
      "1/1 [==============================] - 0s 105ms/step\n",
      "MADISONAL\n",
      "Plumbing Permit\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 669ms/step\n",
      "1/1 [==============================] - 0s 97ms/step\n",
      "MADISONAL\n",
      "Home Buisness Application\n",
      "2018\n",
      "2019\n",
      "1/1 [==============================] - 1s 709ms/step\n",
      "1/1 [==============================] - 0s 121ms/step\n",
      "SPRINGHILL\n",
      "EBilling Form\n",
      "2019\n",
      "2020\n",
      "1/1 [==============================] - 1s 863ms/step\n",
      "1/1 [==============================] - 0s 135ms/step\n",
      "SPRINGHILL\n",
      "EBilling Form\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 670ms/step\n",
      "1/1 [==============================] - 0s 109ms/step\n",
      "BILOXI\n",
      "Fee Schedule\n",
      "2015\n",
      "2020\n",
      "1/1 [==============================] - 1s 636ms/step\n",
      "1/1 [==============================] - 0s 103ms/step\n",
      "BILOXI\n",
      "Fee Schedule\n",
      "2020\n",
      "2023\n",
      "1/1 [==============================] - 1s 869ms/step\n",
      "1/1 [==============================] - 0s 134ms/step\n"
     ]
    }
   ],
   "source": [
    "cos_txt_sim_list = []\n",
    "cos_gfx_sim_list = []\n",
    "for idx in range(len(forms_data)):\n",
    "    print(forms_data.loc[idx,'city'])\n",
    "    print(forms_data.loc[idx,'form'])\n",
    "    print(forms_data.loc[idx,'year1'])\n",
    "    print(forms_data.loc[idx,'year2'])\n",
    "    folder1 = \"data/forms/\"+forms_data.loc[idx,'city']+\"/\" + forms_data.loc[idx,'form']+\"/\"+str(forms_data.loc[idx,'year1'])\n",
    "    folder2 = \"data/forms/\"+forms_data.loc[idx,'city']+\"/\" + forms_data.loc[idx,'form']+\"/\"+str(forms_data.loc[idx,'year2'])\n",
    "    form1 = os.listdir(folder1)\n",
    "    form2 = os.listdir(folder2)\n",
    "    cos_txt_sim, cos_gfx_sim = sim(folder1 +\"/\"+form1[0], folder2 +\"/\"+form2[0])\n",
    "    cos_txt_sim_list = cos_txt_sim_list + [cos_txt_sim]\n",
    "    cos_gfx_sim_list = cos_gfx_sim_list + [cos_gfx_sim]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6fd605e2-54ef-4673-ae2c-0ec1e6e17e4c",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Attach the per-pair scores to forms_data. Each list is wrapped in a one-column\n",
    "# DataFrame, which pandas aligns to forms_data on the row index.\n",
    "for sim_column, sim_values in (('cos_txt_sim', cos_txt_sim_list),\n",
    "                               ('cos_gfx_sim', cos_gfx_sim_list)):\n",
    "    forms_data[sim_column] = pd.DataFrame(sim_values)\n",
    "# Combined score: unweighted mean of the text and graphic similarities\n",
    "forms_data['cos_sim'] = forms_data['cos_txt_sim'].add(forms_data['cos_gfx_sim']).div(2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "63e626e8-f0a7-4502-af02-a9798e0dcf49",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>index</th>\n",
       "      <th>city</th>\n",
       "      <th>form</th>\n",
       "      <th>year1</th>\n",
       "      <th>year2</th>\n",
       "      <th>cityid</th>\n",
       "      <th>trialnumber</th>\n",
       "      <th>insample</th>\n",
       "      <th>matchcityid</th>\n",
       "      <th>comm_preexisted</th>\n",
       "      <th>sim_cos</th>\n",
       "      <th>cos_txt_sim</th>\n",
       "      <th>cos_gfx_sim</th>\n",
       "      <th>cos_sim2</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>20</td>\n",
       "      <td>PHILADELPHIA</td>\n",
       "      <td>Homestead Exemption Application</td>\n",
       "      <td>2015</td>\n",
       "      <td>2020</td>\n",
       "      <td>7</td>\n",
       "      <td>2017073</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0.848329</td>\n",
       "      <td>0.897526</td>\n",
       "      <td>0.799132</td>\n",
       "      <td>0.848329</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>21</td>\n",
       "      <td>PHILADELPHIA</td>\n",
       "      <td>Homestead Exemption Application</td>\n",
       "      <td>2020</td>\n",
       "      <td>2023</td>\n",
       "      <td>7</td>\n",
       "      <td>2017073</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>22</td>\n",
       "      <td>SANANTONIO</td>\n",
       "      <td>PD Property Loss Report</td>\n",
       "      <td>2015</td>\n",
       "      <td>2016</td>\n",
       "      <td>8</td>\n",
       "      <td>2017023</td>\n",
       "      <td>0</td>\n",
       "      <td>19</td>\n",
       "      <td>0</td>\n",
       "      <td>0.998256</td>\n",
       "      <td>0.998944</td>\n",
       "      <td>0.997568</td>\n",
       "      <td>0.998256</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>23</td>\n",
       "      <td>SANANTONIO</td>\n",
       "      <td>Fire Drill Requirements</td>\n",
       "      <td>2017</td>\n",
       "      <td>2020</td>\n",
       "      <td>8</td>\n",
       "      <td>2018024</td>\n",
       "      <td>0</td>\n",
       "      <td>19</td>\n",
       "      <td>1</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>24</td>\n",
       "      <td>SANANTONIO</td>\n",
       "      <td>Fire Drill Requirements</td>\n",
       "      <td>2015</td>\n",
       "      <td>2016</td>\n",
       "      <td>8</td>\n",
       "      <td>2018024</td>\n",
       "      <td>0</td>\n",
       "      <td>19</td>\n",
       "      <td>1</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>370</th>\n",
       "      <td>483</td>\n",
       "      <td>MADISONAL</td>\n",
       "      <td>Home Buisness Application</td>\n",
       "      <td>2018</td>\n",
       "      <td>2019</td>\n",
       "      <td>1240</td>\n",
       "      <td>2016015</td>\n",
       "      <td>0</td>\n",
       "      <td>266</td>\n",
       "      <td>0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>371</th>\n",
       "      <td>484</td>\n",
       "      <td>SPRINGHILL</td>\n",
       "      <td>EBilling Form</td>\n",
       "      <td>2019</td>\n",
       "      <td>2020</td>\n",
       "      <td>1409</td>\n",
       "      <td>2016059</td>\n",
       "      <td>0</td>\n",
       "      <td>123</td>\n",
       "      <td>0</td>\n",
       "      <td>0.975026</td>\n",
       "      <td>0.972284</td>\n",
       "      <td>0.977767</td>\n",
       "      <td>0.975026</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>372</th>\n",
       "      <td>485</td>\n",
       "      <td>SPRINGHILL</td>\n",
       "      <td>EBilling Form</td>\n",
       "      <td>2020</td>\n",
       "      <td>2023</td>\n",
       "      <td>1409</td>\n",
       "      <td>2016059</td>\n",
       "      <td>0</td>\n",
       "      <td>123</td>\n",
       "      <td>0</td>\n",
       "      <td>0.781018</td>\n",
       "      <td>0.848641</td>\n",
       "      <td>0.713394</td>\n",
       "      <td>0.781018</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>373</th>\n",
       "      <td>486</td>\n",
       "      <td>BILOXI</td>\n",
       "      <td>Fee Schedule</td>\n",
       "      <td>2015</td>\n",
       "      <td>2020</td>\n",
       "      <td>1411</td>\n",
       "      <td>2016019</td>\n",
       "      <td>0</td>\n",
       "      <td>266</td>\n",
       "      <td>0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>374</th>\n",
       "      <td>487</td>\n",
       "      <td>BILOXI</td>\n",
       "      <td>Fee Schedule</td>\n",
       "      <td>2020</td>\n",
       "      <td>2023</td>\n",
       "      <td>1411</td>\n",
       "      <td>2016019</td>\n",
       "      <td>0</td>\n",
       "      <td>266</td>\n",
       "      <td>0</td>\n",
       "      <td>0.997218</td>\n",
       "      <td>0.997481</td>\n",
       "      <td>0.996955</td>\n",
       "      <td>0.997218</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>375 rows × 14 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     index          city                             form  year1  year2  \\\n",
       "0       20  PHILADELPHIA  Homestead Exemption Application   2015   2020   \n",
       "1       21  PHILADELPHIA  Homestead Exemption Application   2020   2023   \n",
       "2       22    SANANTONIO          PD Property Loss Report   2015   2016   \n",
       "3       23    SANANTONIO          Fire Drill Requirements   2017   2020   \n",
       "4       24    SANANTONIO          Fire Drill Requirements   2015   2016   \n",
       "..     ...           ...                              ...    ...    ...   \n",
       "370    483     MADISONAL        Home Buisness Application   2018   2019   \n",
       "371    484    SPRINGHILL                    EBilling Form   2019   2020   \n",
       "372    485    SPRINGHILL                    EBilling Form   2020   2023   \n",
       "373    486        BILOXI                     Fee Schedule   2015   2020   \n",
       "374    487        BILOXI                     Fee Schedule   2020   2023   \n",
       "\n",
       "     cityid  trialnumber  insample  matchcityid  comm_preexisted   sim_cos  \\\n",
       "0         7      2017073         0            1                0  0.848329   \n",
       "1         7      2017073         0            1                0  1.000000   \n",
       "2         8      2017023         0           19                0  0.998256   \n",
       "3         8      2018024         0           19                1  1.000000   \n",
       "4         8      2018024         0           19                1  1.000000   \n",
       "..      ...          ...       ...          ...              ...       ...   \n",
       "370    1240      2016015         0          266                0  1.000000   \n",
       "371    1409      2016059         0          123                0  0.975026   \n",
       "372    1409      2016059         0          123                0  0.781018   \n",
       "373    1411      2016019         0          266                0  1.000000   \n",
       "374    1411      2016019         0          266                0  0.997218   \n",
       "\n",
       "     cos_txt_sim  cos_gfx_sim  cos_sim2  \n",
       "0       0.897526     0.799132  0.848329  \n",
       "1       1.000000     1.000000  1.000000  \n",
       "2       0.998944     0.997568  0.998256  \n",
       "3       1.000000     1.000000  1.000000  \n",
       "4       1.000000     1.000000  1.000000  \n",
       "..           ...          ...       ...  \n",
       "370     1.000000     1.000000  1.000000  \n",
       "371     0.972284     0.977767  0.975026  \n",
       "372     0.848641     0.713394  0.781018  \n",
       "373     1.000000     1.000000  1.000000  \n",
       "374     0.997481     0.996955  0.997218  \n",
       "\n",
       "[375 rows x 14 columns]"
      ]
     },
     "execution_count": 20,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "forms_data"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.9"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
